% Web reference: overview of reanalysis projects (UCAR Climate Data Guide URL).
@booklet{RePr,
  title        = {{Overview of Reanalysis Project}},
  howpublished = {\url{http://climatedataguide.ucar.edu/category/data-set-variables/reanalysis}},
}

% Web reference: WRF model home page.
@booklet{WRF,
  title        = {{WRF Model}},
  howpublished = {\url{http://www.wrf-model.org/index.php}},
  year         = {2012},
}

% Web reference: reanalysis.org site.
@booklet{ReDe,
  title        = {{Reanalysis}},
  howpublished = {\url{http://www.reanalysis.org}},
}

% Web reference: Oracle Exadata Database Machine product page.
@booklet{OrEx,
  title        = {{Oracle Exadata Database Machine}},
  howpublished = {\url{http://www.oracle.com/us/products/database/exadata/database-machine-x3-8/overview/index.html}},
}

% Workshop contribution on Blue Gene Active Storage (HEC FSIO R&D Workshop, 2010).
% Authors are separated only by " and "; a comma between two names would be
% read by BibTeX as a single "Last, First" name.
@inproceedings{BGAS,
  author    = {Blake G. Fitch and Alex Rayshubskiy and T. J. Chris Ward and Mike Pitman and Bernard Metzler and Heiko J. Schick and Benjamin Krill and Peter Morjan and Robert S. Germain},
  title     = {{Blue Gene Active Storage}},
  booktitle = {HEC FSIO R\&D Workshop '10},
  year      = {2010},
}

% Sandia technical report SAND2009-7763 on advanced I/O (2009).
% Entered as a report so the report number is not printed as a proceedings title.
% NOTE(review): institution spelled out from "Sandia Tech Report" - confirm.
@techreport{LSKO09,
  author      = {G. F. Lofstead and K. Schwan and S. Klasky and R. A. Oldfield},
  title       = {Advanced {I/O} for Large-Scale Scientific Applications},
  institution = {Sandia National Laboratories},
  number      = {SAND2009-7763},
  year        = {2009},
}

% Conference paper on a decoupled execution paradigm (IEEE Cluster 2012).
% The booktitle carries no leading "In": bibliography styles add that word themselves.
@inproceedings{CCSG2012,
  author    = {Y. Chen and C. Chen and X.-H. Sun and W. D. Gropp and R. Thakur},
  title     = {A Decoupled Execution Paradigm for Data-Intensive High-End Computing},
  booktitle = {Proceedings of the IEEE International Conference on Cluster Computing 2012 (Cluster'12)},
  year      = {2012},
}

% Journal article on the IBM Power5 chip (IEEE Micro 24(2), 2004).
@article{Kalla:MICRO04,
  author  = {R. Kalla and B. Sinharoy and J. Tendler},
  title   = {{IBM Power5 Chip: A Dual-Core Multithreaded Processor}},
  journal = {IEEE Micro},
  volume  = {24},
  number  = {2},
  year    = {2004},
}

% DARPA IPTO exascale computing study (technical report, 2008).
% The truncated author list ends with the literal "and others" so the style can
% render "et al."; the report number has its own field instead of living in type.
@techreport{darpa08:report,
  author      = {P. Kogge and K. Bergman and S. Borkar and others},
  title       = {{Exascale Computing Study: Technology Challenges in Achieving Exascale Systems}},
  institution = {DARPA IPTO},
  type        = {Tech. Rep.},
  number      = {DARPA-2008-13},
  year        = {2008},
}

% Conference paper on sustainable exascale computing (VLSI-SoC, 2010).
@inproceedings{Gioiosa:vlsi-soc10,
  author    = {Roberto Gioiosa},
  title     = {{Towards Sustainable Exascale Computing}},
  booktitle = {IEEE/IFIP VLSI System on Chip Conference (VLSI-SoC)},
  year      = {2010},
}

% Conference paper on energy-constrained MPI execution (PPoPP, 2006).
% Venue string is worded like the other PPoPP entry in this file.
@inproceedings{lowenthal_ppopp06,
  author    = {Robert Springer and David K. Lowenthal and Barry Rountree and Vincent W. Freeh},
  title     = {{Minimizing Execution Time in MPI Programs on an Energy-Constrained, Power-Scalable Cluster}},
  booktitle = {Proceedings of ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming (PPoPP)},
  year      = {2006},
}

% Conference paper on the energy-time tradeoff in MPI programs (IPDPS, 2005).
@inproceedings{Freeh_ipdps05,
  author    = {Vincent W. Freeh and Feng Pan and Nandini Kappiah and David K. Lowenthal and Rob Springer},
  title     = {{Exploring the Energy-Time Tradeoff in MPI Programs on a Power-Scalable Cluster}},
  booktitle = {Proceedings of International Parallel and Distributed Processing Symposium (IPDPS)},
  year      = {2005},
}

% Conference paper on multiple energy gears in MPI programs (PPoPP, 2005).
@inproceedings{Freeh_ppopp05,
  author    = {Vincent W. Freeh and David K. Lowenthal},
  title     = {{Using Multiple Energy Gears in MPI Programs on a Power-Scalable Cluster}},
  booktitle = {Proceedings of ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming (PPoPP)},
  year      = {2005},
}

% Conference paper on just-in-time dynamic voltage scaling (Supercomputing, 2005).
@inproceedings{nandini:sc05,
  author    = {Nandini Kappiah and Vincent Freeh and David Lowenthal},
  title     = {{Just In Time Dynamic Voltage Scaling: Exploiting Inter-Node Slack to Save Energy in MPI Programs}},
  booktitle = {Proceedings of the 2005 ACM/IEEE Conference on Supercomputing},
  year      = {2005},
}

% Conference paper on bounding energy consumption of MPI programs (Supercomputing, 2007).
@inproceedings{Barry_sc07,
  author    = {Barry Rountree and David K. Lowenthal and Shelby Funk and Vincent W. Freeh and Bronis R. de Supinski and Martin Schulz},
  title     = {{Bounding Energy Consumption in Large-scale MPI Programs}},
  booktitle = {Proceedings of the ACM/IEEE International Conference on High-Performance Computing, Networking, and Storage (Supercomputing)},
  year      = {2007},
}

% Conference paper introducing Adagio (ICS, 2009).
% Venue is capitalised like the other ICS entries in this file.
@inproceedings{Barry_ics09,
  author    = {Barry Rountree and David K. Lowenthal and Bronis R. de Supinski and Martin Schulz and Vincent W. Freeh and Tyler Bletsch},
  title     = {{Adagio: Making DVS Practical for Complex HPC Applications}},
  booktitle = {Proceedings of the 23rd International Conference on Supercomputing (ICS)},
  year      = {2009},
}

% Workshop paper on energy-aware workload consolidation on GPUs (2011).
@inproceedings{dong_gpu_consolidation,
  author    = {Dong Li and Surendra Byna and Srimat Chakradhar},
  title     = {{Energy-Aware Workload Consolidation on GPU}},
  booktitle = {International Workshop on Scheduling and Resource Management for Parallel and Distributed Systems},
  year      = {2011},
}

% Workshop paper introducing SPRAT runtime processor selection (2008).
@inproceedings{runtime_proc_selec,
  author    = {Hiroyuki Takizawa and Katsuto Sato and Hiroaki Kobayashi},
  title     = {{SPRAT: Runtime Processor Selection for Energy-aware Computing}},
  booktitle = {International Workshop on Automatic Performance Tuning},
  year      = {2008},
}

% Conference paper on kernel fusion for GPU power efficiency (GreenCom, 2010).
@inproceedings{kernel_fusion,
  author    = {Guibin Wang and Yisong Lin and Wei Yi},
  title     = {{Kernel Fusion: An Effective Method for Better Power Efficiency on Multithreaded GPU}},
  booktitle = {Proceedings of the 2010 IEEE/ACM International Conference on Green Computing and Communications},
  year      = {2010},
}

% Conference paper on strip-mining plus kernel fusion for GPU power (DATE, 2011).
@inproceedings{kernel_fusion2,
  author    = {Guibin Wang},
  title     = {{Coordinate Strip-mining and Kernel Fusion to Lower Power Consumption on GPU}},
  booktitle = {Proceedings of Design, Automation and Test in Europe Conference and Exhibition},
  year      = {2011},
}

% Symposium paper on power-efficient CPU-GPU work distribution (2010).
@inproceedings{workload_dist,
  author    = {Guibin Wang and Xiaoguang Ren},
  title     = {{Power-Efficient Work Distribution Method for CPU-GPU Heterogeneous System}},
  booktitle = {International Symposium on Parallel and Distributed Processing with Applications},
  year      = {2010},
}

% Conference paper on power-performance prediction models (PACT, 2008).
@inproceedings{Matt:PACT08,
  author    = {Matthew Curtis-Maury and Ankur Shah and Filip Blagojevic and Dimitrios S. Nikolopoulos and Bronis R. de Supinski and Martin Schulz},
  title     = {{Prediction Models for Multi-dimensional Power-Performance Optimization on Many Cores}},
  booktitle = {Proceedings of the 17th International Conference on Parallel Architectures and Compilation Techniques (PACT)},
  year      = {2008},
}

% Journal article on prediction-based power-performance adaptation (TPDS, 2008).
@article{Matt:TPDS,
  author  = {Matthew Curtis-Maury and Filip Blagojevic and Christos D. Antonopoulos and Dimitrios S. Nikolopoulos},
  title   = {{Prediction-Based Power-Performance Adaptation of Multithreaded Scientific Codes}},
  journal = {{IEEE Transactions on Parallel and Distributed Systems (TPDS)}},
  year    = {2008},
}

% Conference paper on online power-performance adaptation (ICS, 2006).
@inproceedings{Matt:ICS06,
  author    = {Matthew Curtis-Maury and James Dzierwa and Christos D. Antonopoulos and Dimitrios S. Nikolopoulos},
  title     = {{Online Power-Performance Adaptation of Multithreaded Programs using Event-Based Prediction}},
  booktitle = {Proceedings of the 20th ACM International Conference on Supercomputing (ICS)},
  year      = {2006},
}

% Conference paper on dynamic power-performance adaptation on CMPs (HPCA, 2006).
% The middle initial is separated from the surname by a space; without it
% BibTeX would take "F.Martinez" as the last name.
@inproceedings{Li_hpca06,
  author    = {Jian Li and Jose F. Martinez},
  title     = {{Dynamic Power-Performance Adaptation of Parallel Computation on Chip Multiprocessors}},
  booktitle = {Proceedings of Symposium on High-Performance Computer Architecture (HPCA)},
  year      = {2006},
}

% Conference paper on hybrid MPI/OpenMP power-aware computing (IPDPS, 2010).
@inproceedings{dong_ipdps10,
  author    = {Dong Li and Bronis de Supinski and Martin Schulz and Dimitrios Nikolopoulos and Kirk Cameron},
  title     = {{Hybrid MPI/OpenMP Power-Aware Computing}},
  booktitle = {Proceedings of the International Parallel and Distributed Processing Symposium},
  year      = {2010},
}

% Poster on model-based hybrid MPI/OpenMP power-aware computing.
% NOTE(review): key suffix says sc10 but the year field is 2009 - confirm which is right.
@inproceedings{dong_sc10,
  author    = {Dong Li and Bronis de Supinski and Martin Schulz and Dimitrios Nikolopoulos and Kirk Cameron},
  title     = {{Poster: Model-based Hybrid MPI/OpenMP Power-Aware Computing}},
  booktitle = {International Conference for High Performance Computing, Networking, Storage and Analysis},
  year      = {2009},
}

% Journal article on energy-efficient resource management for hybrid programming models (2012).
@article{dong_tpds,
  author  = {Dong Li and Bronis de Supinski and Martin Schulz and Dimitrios Nikolopoulos and Kirk Cameron},
  title   = {{Strategies for Energy Efficient Resource Management of Hybrid Programming Models}},
  journal = {IEEE Transactions on Parallel and Distributed Systems},
  year    = {2012},
}

% Journal article on a performance tool interface for OpenMP (Journal of Supercomputing, 2002).
@article{opari,
  author  = {Bernd Mohr and Allen Malony and Sameer Shende and Felix Wolf},
  title   = {{Design and Prototype of a Performance Tool Interface for OpenMP}},
  journal = {The Journal of Supercomputing},
  year    = {2002},
}

% Conference paper on coordinated multi-level power management (ASPLOS, 2008).
% TeX quotes open with two backticks and close with two apostrophes.
@inproceedings{partha_asplos08,
  author    = {Ramya Raghavendra and Parthasarathy Ranganathan and Vanish Talwar and Zhikui Wang and Xiaoyun Zhu},
  title     = {{No ``Power'' Struggles: Coordinated Multi-level Power Management for the Data Center}},
  booktitle = {Architectural Support for Programming Languages and Operating Systems},
  year      = {2008},
}

% Conference paper on coordinated processor and memory power control (ICS, 2011).
@inproceedings{mem_processor_ics11,
  author    = {Ming Chen and Xiaorui Wang and Xue Li},
  title     = {{Coordinating Processor and Main Memory for Efficient Server Power Control}},
  booktitle = {International Conference on Supercomputing},
  year      = {2011},
}

% Conference paper on reducing peak power in server systems (ICS, 2005).
@inproceedings{mem_processor_ics05,
  author    = {Wes Felter and Karthick Rajamani and Tom Keller and Cosmin Rusu},
  title     = {{A Performance-Conserving Approach for Reducing Peak Power Consumption in Server Systems}},
  booktitle = {International Conference on Supercomputing},
  year      = {2005},
}

% Conference paper on cache decay and leakage power (ISCA, 2001).
@inproceedings{cache_power,
  author    = {S. Kaxiras and Z. Hu and M. Martonosi},
  title     = {{Cache Decay: Exploiting Generational Behavior to Reduce Cache Leakage Power}},
  booktitle = {International Symposium on Computer Architecture},
  year      = {2001},
}

% Conference paper introducing the Orion interconnect power simulator (2002).
% The booktitle names the proceedings rather than repeating the paper title.
@inproceedings{network_power,
  author    = {Hang-Sheng Wang and Xinping Zhu and Li-Shiuan Peh and Sharad Malik},
  title     = {{Orion: A Power-Performance Simulator for Interconnection Networks}},
  booktitle = {Proceedings of the 35th Annual IEEE/ACM International Symposium on Microarchitecture (MICRO)},
  year      = {2002},
}

% Conference paper on modeling hard-disk power consumption (USENIX FAST, 2003).
@inproceedings{disk_power,
  author    = {John Zedlewski and Sumeet Sobti and Nitin Garg and Fengzhou Zheng and Arvind Krishnamurthy and Randolph Wang},
  title     = {{Modeling Hard-Disk Power Consumption}},
  booktitle = {USENIX Conference on File and Storage Technologies},
  year      = {2003},
}

% Conference paper on IBM POWER7 power management (HPCA, 2010).
@inproceedings{power7,
  author    = {Malcolm Ware and Karthick Rajamani and Michael Floyd and Bishop Brock},
  title     = {{Architecting for Power Management: The IBM POWER7 Approach}},
  booktitle = {International Symposium on High Performance Computer Architecture},
  year      = {2010},
}

% Conference paper on the 48-core SCC processor from the programmer's view (SC, 2010).
% The compound surname is braced and given in "Last, First" form; in
% "First von Last" form the capitalised "Van" would be counted as a given name.
@inproceedings{intel_scc,
  author    = {Timothy G. Mattson and {Van der Wijngaart}, Rob F. and Michael Riepen and Thomas Lehnig and Paul Brett and
               Werner Haas and Patrick Kennedy and Jason Howard and Sriram Vangal and Nitin Borkar and Greg Ruhl and Saurabh Dighe},
  title     = {{The 48-core SCC Processor: the Programmer's View}},
  booktitle = {International Conference for High Performance Computing, Networking, Storage and Analysis},
  year      = {2010},
}

% Conference paper characterising GPU kernel power and performance (GreenCom, 2010).
@inproceedings{gpu_dvfs,
  author    = {Yang Jiao and Heshan Lin and Pavan Balaji and Wu-chun Feng},
  title     = {{Power and Performance Characterization of Computational Kernels on the GPU}},
  booktitle = {International Conference on Green Computing and Communications (GreenCom 2010)},
  year      = {2010},
}

% Conference paper on multi-mode energy management for server clusters (PACT, 2008).
@inproceedings{power_pact08,
  author    = {T. Horvath and K. Skadron},
  title     = {{Multi-mode Energy Management for Multi-tier Server Clusters}},
  booktitle = {International Conference on Parallel Architectures and Compilation Techniques},
  year      = {2008},
}

% Symposium paper on statistical correlations for predicting program behaviour (CGO, 2010).
% NOTE(review): the key suffix says pact08 while the venue and year say CGO 2010 - confirm.
@inproceedings{correlation_pact08,
  author    = {Y. Jiang and E. Zhang and K. Tian and F. Mao and M. Gethers and X. Shen and Y. Gao},
  title     = {{Exploiting Statistical Correlations for Proactive Prediction of Program Behaviors}},
  booktitle = {International Symposium on Code Generation and Optimization},
  year      = {2010},
}

% Conference paper on heterogeneous task scheduling for accelerated OpenMP (IPDPS, 2012).
@inproceedings{workload_dist_ipdps12,
  author    = {Thomas R. W. Scogland and Barry Rountree and Wu-chun Feng and Bronis R. de Supinski},
  title     = {{Heterogeneous Task Scheduling for Accelerated OpenMP}},
  booktitle = {Proceedings of the International Parallel and Distributed Processing Symposium},
  year      = {2012},
}

% Conference paper introducing OpenMPC (SC, 2010).
% No blank inside the protective braces: a space there is typeset before the title.
@inproceedings{seyong_sc10,
  author    = {Seyong Lee and Rudolf Eigenmann},
  title     = {{OpenMPC: Extended OpenMP Programming and Tuning for GPUs}},
  booktitle = {International Conference for High Performance Computing, Networking, Storage and Analysis},
  year      = {2010},
}

% Workshop paper introducing HMPP (GPGPU workshop, 2007).
% Accented letters are written as LaTeX escapes so the file stays 7-bit clean.
@inproceedings{hmpp_gpgpu07,
  author    = {Romain Dolbeau and St{\'e}phane Bihan and Fran{\c{c}}ois Bodin},
  title     = {{HMPP: A Hybrid Multi-core Parallel Programming Environment}},
  booktitle = {International Workshop on General Purpose Processing Using GPUs},
  year      = {2007},
}

% Conference paper introducing StarPU (Euro-Par, 2009).
@inproceedings{starpu_Europar,
  author    = {C{\'e}dric Augonnet and Samuel Thibault and Raymond Namyst and Pierre-Andr{\'e} Wacrenier},
  title     = {{StarPU: A Unified Platform for Task Scheduling on Heterogeneous Multicore Architectures}},
  booktitle = {Proceedings of the 15th International Euro-Par Conference},
  year      = {2009},
}

% Conference paper introducing the MDR model-driven runtime (ICS, 2011).
@inproceedings{scheduling_anand_ics11,
  author    = {Jacques A. Pienaar and Anand Raghunathan and Srimat Chakradhar},
  title     = {{MDR: Performance Model Driven Runtime for Heterogeneous Parallel Platforms}},
  booktitle = {Proceedings of International Conference on Supercomputing},
  year      = {2011},
}

% Symposium paper introducing Qilin adaptive mapping (MICRO, 2009).
@inproceedings{qilin_micro09,
  author    = {Chi-Keung Luk and Sunpyo Hong and Hyesoon Kim},
  title     = {{Qilin: Exploiting Parallelism on Heterogeneous Multiprocessors with Adaptive Mapping}},
  booktitle = {International Symposium on Microarchitecture},
  year      = {2009},
}

% Conference paper introducing the Ocelot dynamic optimization framework (PACT).
% NOTE(review): key suffix says pact09 while the year field is 2010 - confirm.
@inproceedings{ocelot_pact09,
  author    = {Gregory Diamos and Andrew Kerr and Sudhakar Yalamanchili and Nathan Clark},
  title     = {{Ocelot: a Dynamic Optimization Framework for Bulk-synchronous Applications in Heterogeneous Systems}},
  booktitle = {International Conference on Parallel Architecture and Compilation Techniques},
  year      = {2010},
}

% Symposium paper on power shifting in a thrifty interconnection network (HPCA, 2011).
@inproceedings{thrifty_interconnect_ibm,
  author    = {Jian Li and Wei Huang and Charles Lefurgy and Lixin Zhang and Wolfgang E. Denzel and Richard R. Treumann and Kun Wang},
  title     = {{Power Shifting in Thrifty Interconnection Network}},
  booktitle = {International Symposium on High Performance Computer Architecture},
  year      = {2011},
}

% Conference paper introducing CPU MISER (ICPP, 2007).
@inproceedings{cpumiser_icpp07,
  author    = {Rong Ge and Xizhou Feng and Wu-chun Feng and Kirk Cameron},
  title     = {{CPU MISER: A Performance-Directed, Run-Time System for Power-Aware Clusters}},
  booktitle = {International Conference on Parallel Processing},
  year      = {2007},
}

% Conference paper on power-aware page allocation (ASPLOS, 2000).
% No blank inside the protective braces: a space there is typeset before the title.
@inproceedings{mem_power_page_alloc,
  author    = {Alvin R. Lebeck and Xiaobo Fan and Heng Zeng and Carla Schlatter Ellis},
  title     = {{Power Aware Page Allocation}},
  booktitle = {International Conference on Architectural Support for Programming Languages and Operating Systems},
  year      = {2000},
}

% Workshop paper on full-system power analysis and modeling (2006).
@inproceedings{Economou06full-systempower,
  author    = {Dimitris Economou and Suzanne Rivoire and Christos Kozyrakis},
  title     = {{Full-System Power Analysis and Modeling for Server Environments}},
  booktitle = {Workshop on Modeling Benchmarking and Simulation},
  year      = {2006},
}

% Conference paper on run-time OS power modeling (SIGMETRICS, 2003).
% Page ranges use a double hyphen so they typeset as an en dash.
@inproceedings{tao:sigmetrics03,
  author    = {Tao Li and Lizy Kurian John},
  title     = {{Run-Time Modeling and Estimation of Operating System Power Consumption}},
  booktitle = {SIGMETRICS},
  pages     = {160--171},
  year      = {2003},
}

% Conference paper on energy conservation in heterogeneous server clusters (PPoPP, 2005).
% The suffixed name uses the "Last, Jr., First" form; written as
% "First Last Jr" BibTeX would take "Jr" as the surname.
@inproceedings{Heath05,
  author    = {Taliver Heath and Bruno Diniz and Enrique V. Carrera and Meira, Jr., Wagner and Ricardo Bianchini},
  title     = {{Energy Conservation in Heterogeneous Server Clusters}},
  booktitle = {Proceedings of Symposium on Principles and Practice of Parallel Programming},
  year      = {2005},
}

% Conference paper on a phase-change-memory main memory system (ISCA, 2009).
@inproceedings{qureshi:isca09,
  author    = {M. K. Qureshi and V. Srinivasan and J. A. Rivers},
  title     = {{Scalable High Performance Main Memory System Using Phase-Change Memory Technology}},
  booktitle = {Proceedings of the International Symposium on Computer Architecture},
  year      = {2009},
}

% Conference paper by Zhou, Zhao, Yang and Zhang on phase change main memory (ISCA, 2009).
% The title is this paper's own; the previous value was the title of the
% Zhang and Li PACT paper, which has its own entries in this file.
@inproceedings{zhou:isca,
  author    = {P. Zhou and B. Zhao and J. Yang and Y. Zhang},
  title     = {{A Durable and Energy Efficient Main Memory Using Phase Change Memory Technology}},
  booktitle = {International Symposium on Computer Architecture},
  year      = {2009},
}

% Conference paper on phase change memory with 3D die-stacking (PACT, 2009).
% The same work is also listed under the key zhang:pact in this file.
@inproceedings{zhang:pact09,
  author    = {W. Zhang and T. Li},
  title     = {{Exploring Phase Change Memory and 3D Die-Stacking for Power/Thermal Friendly, Fast and Durable Memory Architecture}},
  booktitle = {International Conference on Parallel Architecture and Compilation Techniques},
  year      = {2009},
}

% Conference paper on page placement in hybrid memory systems (ICS, 2011).
@inproceedings{Ramos:ics11,
  author    = {Luiz Ramos and Eugene Gorbatov and Ricardo Bianchini},
  title     = {{Page Placement in Hybrid Memory Systems}},
  booktitle = {Proceedings of the International Conference on Supercomputing},
  year      = {2011},
}

% Journal article on memory access patterns of supercomputer applications (2007).
@article{murph_toc,
  author  = {R. Murphy and P. Kogge},
  title   = {{On the Memory Access Patterns of Supercomputer Applications: Benchmark Selection and Its Implications}},
  journal = {IEEE Transactions on Computers},
  volume  = {56},
  number  = {7},
  year    = {2007},
}

% Carnegie Mellon research report 2011-005 on the DynRBLA caching policy (2011).
@techreport{row_buffer_hybrid,
  author      = {HanBin Yoon and Justin Meza and Rachata Ausavarungnirun and Rachael Harding and Onur Mutlu},
  title       = {{DynRBLA: A High-Performance and Energy-Efficient Row Buffer Locality-Aware Caching Policy for Hybrid Memories}},
  type        = {{R}esearch {R}eport},
  institution = {Computer Architecture Lab (CALCM), Carnegie Mellon University},
  number      = {2011-005},
  year        = {2011},
  url         = {http://www.ece.cmu.edu/~safari/tr/tr-2011-005-3.pdf},
}



% Conference paper introducing PDRAM hybrid main memory (DAC, 2009).
@inproceedings{hybridmem_dac,
  author    = {Gaurav Dhiman and Raid Ayoub and Tajana Rosing},
  title     = {{PDRAM: A Hybrid PRAM and DRAM Main Memory System}},
  booktitle = {Design Automation Conference},
  year      = {2009},
}

% Conference paper analysing scientific applications for non-volatile memory (IPDPS, 2012).
@inproceedings{dong_nvm_pattern,
  author    = {Dong Li and Jeffrey Vetter and Gabriel Marin and Collin McCurdy and Cristian Cira and Zhuo Liu and Weikuan Yu},
  title     = {{An Analysis of Scientific Applications for Using Non-Volatile Memory in High Performance Computing}},
  booktitle = {Proceedings of International Parallel and Distributed Processing Symposium},
  year      = {2012},
}

% Conference paper on phase change memory with 3D die-stacking (PACT, 2009).
% The same work is also listed under the key zhang:pact09 in this file.
@inproceedings{zhang:pact,
  author    = {W. Zhang and T. Li},
  title     = {{Exploring Phase Change Memory and 3D Die-Stacking for Power/Thermal Friendly, Fast and Durable Memory Architecture}},
  booktitle = {International Conference on Parallel Architecture and Compilation Techniques},
  year      = {2009},
}

% Journal article introducing the DRAMSim2 memory system simulator (2011).
% Journal name is given in normal capitalisation, without padding inside the braces.
@article{dramsim2,
  author  = {Paul Rosenfeld and Elliott Cooper-Balis and Bruce Jacob},
  title   = {{DRAMSim2: A Cycle Accurate Memory System Simulator}},
  journal = {IEEE Computer Architecture Letters},
  volume  = {10},
  number  = {1},
  year    = {2011},
}

% Symposium paper on analysing CUDA workloads with a GPU simulator (ISPASS, 2009).
@inproceedings{gpgpusim,
  author    = {Ali Bakhoda and George L. Yuan and Wilson W. L. Fung and Henry Wong and Tor M. Aamodt},
  title     = {{Analyzing CUDA Workloads Using a Detailed GPU Simulator}},
  booktitle = {Proceedings of International Symposium on Performance Analysis of Systems and Software},
  year      = {2009},
}

% Conference paper introducing the Pin dynamic instrumentation tool (PLDI, 2005).
@inproceedings{pintool,
  author    = {Chi-Keung Luk and Robert Cohn and Robert Muth and Harish Patil and Artur Klauser and Geoff Lowney and Steven Wallace and Vijay Janapa Reddi and Kim Hazelwood},
  title     = {{Pin: Building Customized Program Analysis Tools with Dynamic Instrumentation}},
  booktitle = {Proceedings of SIGPLAN conference on Programming language design and implementation},
  year      = {2005},
}

% Symposium paper on the efficacy of a fused CPU+GPU processor (SAAHPC, 2011).
% No blank before the closing braces: a space there is typeset ahead of the
% punctuation that the style appends to the title.
@inproceedings{wu_apu,
  author    = {Mayank Daga and Ashwin Aji and Wu-chun Feng},
  title     = {{On the Efficacy of a Fused CPU+GPU Processor for Parallel Computing}},
  booktitle = {Proceedings of the Symposium on Application Accelerators in High-Performance Computing},
  year      = {2011},
}
 @inproceedings{cuda_to_opencl,
  author    = {Gabriel Martinez and Mark Gardner and Wu-chun Feng},
  title     = {{CU2CL: A CUDA-to-OpenCL Translator for Multi- and Many-Core Architectures}},
  booktitle = {Proceedings of the 17th IEEE International Conference on Parallel and Distributed Systems},
  year      = {2011},
}

% Chapter on the DARPA HPCS program in Advances in Computers, volume 72 (2008).
% NOTE(review): Advances in Computers is a book series, so an incollection
% entry with publisher may be the better type - confirm before changing.
@inproceedings{darpa_report,
  author    = {Jack Dongarra and Robert Graybill and William Harrod and Bob Lucas and Ewing Lusk and Piotr Luszczek and Janice McMahon and Allan Snavely and Jeffrey Vetter and Katherine Yelick and Sadaf Alam and Roy Campbell and Laura Carrington and Tzu-Yi Chen and Omid Khalili and Jeremy Meredith and Mustafa Tikir},
  title     = {{DARPA's HPCS Program: History, Models, Tools, Languages}},
  booktitle = {Advances in Computers},
  volume    = {72},
  year      = {2008},
}

% DARPA exascale computing study with the full author list (technical report, 2008).
% The same study is also listed, with a shortened author list, under darpa08:report.
% No blank inside the protective title braces: a space there is typeset before the title.
@techreport{darpa_report_2,
  author      = {Peter Kogge and Keren Bergman and Shekhar Borkar and Dan Campbell and William Carlson and
                 William Dally and Monty Denneau and Paul Franzon and William Harrod and Kerry Hill and
                 Jon Hiller and Sherman Karp and Stephen Keckler and Dean Klein and Robert Lucas and Mark Richards and Al Scarpelli and
                 Steven Scott and Allan Snavely and Thomas Sterling and R. Stanley Williams and Katherine Yelick},
  title       = {{Exascale Computing Study: Technology Challenges in Achieving Exascale Systems}},
  type        = {Technical report},
  institution = {DARPA Information Processing Techniques Office},
  year        = {2008},
}

% US Department of Energy report on exascale modeling and simulation (2007).
% No blank inside the protective title braces: a space there is typeset before the title.
@techreport{model_simu_report_exascale,
  author      = {Horst Simon and Thomas Zacharia and Rick Stevens},
  title       = {{Modeling and Simulation at the Exascale for Energy and the Environment}},
  institution = {US Department of Energy},
  year        = {2007},
}

% US Department of Energy workshop report on petascale software development tools (2007).
% No blank inside the protective title braces: a space there is typeset before the title.
@techreport{doe_report,
  author      = {Jeffrey S. Vetter and Fred Johnson and Thuc Hoang and Bronis de Supinski and Bart Miller and Mary Zosel and
                 Susan Coghlan and Al Geist and Jeffrey Hollingsworth and Curtis Janssen and Bernd Mohr and Rod Oldehoeft and
                 Craig Rasmussen and Daniel Reed},
  title       = {{Report from the Workshop on Software Development Tools for Petascale Computing (SDTPC)}},
  type        = {Technical report},
  institution = {US Department of Energy},
  year        = {2007},
}

% Paper on the Tsubame cluster experience, published in LNCS volume 4757 (2007).
% NOTE(review): LNCS is a book series and number 8 may actually be the first
% page - confirm against the publisher record before restructuring.
@article{tsubame_2.0,
  author  = {S. Matsuoka},
  title   = {{The Tsubame Cluster Experience a Year Later, and onto Petascale Tsubame 2.0}},
  journal = {Lecture Notes in Computer Science},
  volume  = {4757},
  number  = {8},
  year    = {2007},
}

% Journal article on GPU accelerated computing (volume 180, article 012043, 2009).
% The phrase about the rebirth of vector computing is the tail of the title,
% not the journal; the journal is the IOP conference series.
@article{tsubame_report,
  author  = {S. Matsuoka and T. Aoki and T. Endo and A. Nukada and T. Kato and A. Hasegawa},
  title   = {{GPU Accelerated Computing -- from Hype to Mainstream, the Rebirth of Vector Computing}},
  journal = {Journal of Physics: Conference Series},
  volume  = {180},
  pages   = {012043},
  year    = {2009},
}


% TOP500 note on the Tianhe-1 supercomputer (2009).
% The apostrophe is plain ASCII and the title has no padding inside its braces.
@booklet{tianhe,
  author = {TOP500},
  title  = {{Tianhe-1, China's First Petaflop/s Scale Supercomputer}},
  year   = {2009},
}

% Journal article introducing PowerPack energy profiling (IEEE TPDS 21(5), May 2010).
% The title is brace-protected like the other titles in this file so that
% sentence-casing styles do not lowercase the PowerPack name; the keyword
% list carries each keyword once.
@article{powerpack,
  author     = {Ge, Rong and Feng, Xizhou and Song, Shuaiwen and Chang, Hung-Ching and Li, Dong and Cameron, Kirk W.},
  title      = {{PowerPack: Energy Profiling and Analysis of High-Performance Systems and Applications}},
  journal    = {IEEE Trans. Parallel Distrib. Syst.},
  issue_date = {May 2010},
  volume     = {21},
  number     = {5},
  month      = may,
  year       = {2010},
  issn       = {1045-9219},
  pages      = {658--671},
  numpages   = {14},
  url        = {http://dx.doi.org/10.1109/TPDS.2009.76},
  doi        = {10.1109/TPDS.2009.76},
  acmid      = {1804138},
  publisher  = {IEEE Press},
  address    = {Piscataway, NJ, USA},
  keywords   = {CMP-based cluster, Distributed system, energy efficiency, power measurement, system tools, power management, dynamic voltage and frequency scaling},
}

% Conference paper on architecture-aware mapping on a 1600-core GPU (ICPADS, 2011).
% No blank inside the protective title braces: a space there is typeset before the title.
@inproceedings{arch_mapping_opencl,
  author    = {Mayank Daga and Tom Scogland and Wu-chun Feng},
  title     = {{Architecture-Aware Mapping and Optimization on a 1600-Core GPU}},
  booktitle = {Proceedings of the 17th IEEE International Conference on Parallel and Distributed Systems},
  year      = {2011},
}

% Conference paper introducing the StreamMR MapReduce framework for AMD GPUs (ICPADS, 2011).
@inproceedings{streammr,
  author    = {Marwa Elteir and Heshan Lin and Wu-chun Feng},
  title     = {{StreamMR: An Optimized MapReduce Framework for AMD GPUs}},
  booktitle = {Proceedings of the 17th IEEE International Conference on Parallel and Distributed Systems},
  year      = {2011},
}

% Conference paper on statistical power and performance modeling (GreenCom, 2010).
% No blank inside the protective title braces: a space there is typeset before the title.
@inproceedings{wu_power_model,
  author    = {Balaji Subramaniam and Wu-chun Feng},
  title     = {{Statistical Power and Performance Modeling for Optimizing the Energy Efficiency of Scientific Computing}},
  booktitle = {Proceedings of the IEEE/ACM International Conference on Green Computing and Communications (GreenCom)},
  year      = {2010},
}

% Workshop paper on GPU energy efficiency for scientific computing (HPPAC at IPDPS, 2009).
% Page range uses a double hyphen; title and pages carry no padding blanks.
% NOTE(review): the page numbers look unusual for a workshop paper - confirm.
@inproceedings{wu_gpu_energy,
  author    = {Song Huang and Shucai Xiao and Wu-chun Feng},
  title     = {{On the Energy Efficiency of Graphics Processing Units for Scientific Computing}},
  booktitle = {Proceedings of the 5th IEEE Workshop on High-Performance, Power-Aware Computing (in conjunction with the 23rd International Parallel and Distributed Processing Symposium)},
  pages     = {3801--3804},
  year      = {2009},
}

% Symposium paper on data-aware scheduling of legacy kernels (SPAA, 2010).
% Page range uses a double hyphen; the title has no padding inside its braces.
@inproceedings{data_aware_scheduling_spaa10,
  author    = {M. Becchi and S. Byna and S. Cadambi and S. Chakradhar},
  title     = {{Data-Aware Scheduling of Legacy Kernels on Heterogeneous Platforms with Distributed Memory}},
  booktitle = {ACM Symposium on Parallelism in Algorithms and Architectures},
  pages     = {82--91},
  year      = {2010},
}

% Conference paper on energy conservation for disk array-based servers (ICS, 2004).
% No blank inside the protective title braces: a space there is typeset before the title.
@inproceedings{disk_power_ics04,
  author    = {E. Pinheiro and R. Bianchini},
  title     = {{Energy Conservation Techniques for Disk Array-Based Servers}},
  booktitle = {Proceedings of the 18th Annual ACM International Conference on Supercomputing (ICS'04)},
  year      = {2004},
}



% Symposium paper on DRAM energy management via power mode control (HPCA, 2001).
% The booktitle carries no leading "In" (styles add it) and uses normal
% capitalisation for the short words.
@inproceedings{dram_power_hpca01,
  author    = {V. Delaluz and A. Sivasubramaniam and M. Kandemir and N. Vijaykrishnan and M. Irwin},
  title     = {{DRAM Energy Management Using Software and Hardware Directed Power Mode Control}},
  booktitle = {Proceedings of the Seventh International Symposium on High-Performance Computer Architecture ({HPCA}'01)},
  year      = {2001},
}

% Symposium paper on memory controller policies for DRAM power management (ISLPED, 2001).
% No blank inside the protective title braces: a space there is typeset before the title.
@inproceedings{dram_power_ispled01,
  author    = {Xiaobo Fan and Carla Ellis and Alvin Lebeck},
  title     = {{Memory Controller Policies for DRAM Power Management}},
  booktitle = {Proceedings of the 2001 international symposium on Low power electronics and design (ISLPED)},
  year      = {2001},
}

% Magazine article on reducing disk power with DRPM (IEEE Computer 36(12), 2003).
% Entered as an article because it has a volume, an issue number and pages in
% a periodical; the special-issue name is kept as a note.
@article{disk_power_ieee_computer,
  author  = {S. Gurumurthi and A. Sivasubramaniam and M. Kandemir and H. Franke},
  title   = {{Reducing Disk Power Consumption in Servers with DRPM}},
  journal = {IEEE Computer},
  volume  = {36},
  number  = {12},
  pages   = {59--66},
  year    = {2003},
  note    = {Special Issue on Power-Aware and Temperature-Aware Computing},
}

% Journal article on adaptive mode control for static-power-efficient caches (ACM TECS 2(3), 2003).
% Entered as an article because the venue is a journal with volume and issue.
@article{cache_power_tecs,
  author  = {Huiyang Zhou and Mark C. Toburen and Eric Rotenberg and Thomas M. Conte},
  title   = {{Adaptive Mode Control: A Static-power-efficient Cache Design}},
  journal = {ACM Transactions on Embedded Computing Systems (TECS)},
  volume  = {2},
  number  = {3},
  year    = {2003},
}

% UC Irvine CECS technical report TR-04-28 introducing eCACTI (2004).
% The report number has its own field; type holds only the label.
@techreport{ecacti,
  author      = {Mahesh Mamidipaka and Nikil Dutt},
  title       = {{eCACTI: An Enhanced Power Estimation Model for On-chip Caches}},
  type        = {Technical Report},
  number      = {TR-04-28},
  institution = {CECS, University of California Irvine},
  year        = {2004},
}

% Journal article presenting the International Exascale Software Project roadmap (2011).
% "and others" marks the truncated author list; the project name is braced
% so sentence-casing styles keep its capitals; pages use a double hyphen.
@article{DBMA11,
  author  = {Jack Dongarra and Peter H. Beckman and Terry Moore and others},
  title   = {The {International Exascale Software Project} Roadmap},
  journal = {International Journal of High Performance Computing Applications},
  volume  = {25},
  number  = {1},
  pages   = {3--60},
  year    = {2011},
}

% Magazine article on energy-efficient computing for extreme-scale science (IEEE Computer 42(11), 2009).
% Page range uses a double hyphen so it typesets as an en dash.
@article{DOSW09,
  author  = {David Donofrio and
             Leonid Oliker and
             John Shalf and
             Michael F. Wehner and
             Chris Rowen and
             Jens Krueger and
             Shoaib Kamil and
             Marghoob Mohiyuddin},
  title   = {Energy-Efficient Computing for Extreme-Scale Science},
  journal = {IEEE Computer},
  volume  = {42},
  number  = {11},
  pages   = {62--71},
  year    = {2009},
}

% Journal article on coordinating computation and I/O in parallel sequence search (TPDS 22(4), 2011).
% Page range uses a double hyphen so it typesets as an en dash.
@article{LMFS11,
  author    = {Heshan Lin and
               Xiaosong Ma and
               Wu-chun Feng and
               Nagiza F. Samatova},
  title     = {{Coordinating Computation and I/O in Massively Parallel Sequence
               Search}},
  journal   = {IEEE Trans. Parallel Distrib. Syst.},
  volume    = {22},
  number    = {4},
  pages     = {529--543},
  year      = {2011},
  ee        = {http://doi.ieeecomputersociety.org/10.1109/TPDS.2010.101},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}

% ExaScale software study published by DARPA IPTO (2009).
% "and others" marks the truncated author list so the style can print "et al.".
% NOTE(review): this looks like a report rather than a journal article - confirm
% before changing the entry type.
@article{SACC09,
  author    = {Vivek Sarkar and Saman Amarasinghe and Dan Campbell and others},
  title     = {{ExaScale Software Study: Software Challenges in Extreme Scale Systems}},
  journal   = {ExaScale Computing Study},
  pages     = {1--159},
  publisher = {DARPA IPTO},
  year      = {2009},
}

% Carnegie Mellon technical report CMU-CS-07-128 making the case for DISC (2007).
% The report number has its own field; type holds only the label.
@techreport{Brya07,
  author      = {Randal E. Bryant},
  title       = {{Data-Intensive Supercomputing: The Case for DISC}},
  type        = {Tech Report},
  number      = {CMU-CS-07-128},
  institution = {Carnegie Mellon University School of Computer Science},
  year        = {2007},
}

% Web reference: PVFS developer's guide (PDF on pvfs.org).
% The team is a corporate author, double-braced so it is not split into
% first and last names; the URL ends at the file name with no trailing period.
@booklet{PVFS2Dev,
  author       = {{PVFS2 Development Team}},
  title        = {{PVFS Developer's Guide}},
  howpublished = {\url{http://www.pvfs.org/cvs/pvfs-2-8-branch-docs/doc/pvfs2-guide.pdf}},
}

% Web reference: Data-Intensive Computing Initiative (pnl.gov URL).
@booklet{DICI,
  title        = {{Data-Intensive Computing Initiative}},
  howpublished = {\url{http://dicomputing.pnl.gov/}},
}

% Web reference: Gyrokinetic Toroidal Code (GTC) project page (pppl.gov URL).
@booklet{GTC,
  title        = {{Gyrokinetic Particle Simulations Gyrokinetic Toroidal Code (GTC)}},
  howpublished = {\url{http://w3.pppl.gov/theory/proj_gksim.html}},
}

% Web reference: Jaguar supercomputer page at OLCF.
@booklet{Jaguar,
  title        = {{Jaguar supercomputer at the Oak Ridge Leadership Computing Facility of Oak Ridge National Laboratory}},
  howpublished = {\url{http://www.olcf.ornl.gov/computing-resources/jaguar/}},
}

% Web reference: DOE INCITE program page.
@booklet{INCITE,
  title        = {{DOE Innovative and Novel Computational Impact on Theory and Experiment Program}},
  howpublished = {\url{http://hpc.science.doe.gov/}},
}

% Conference paper on exascale computing technology challenges (VECPAR, 2010).
% Page range uses a double hyphen so it typesets as an en dash.
@inproceedings{ShDM10,
  author    = {John Shalf and Sudip S. Dosanjh and John Morrison},
  title     = {{Exascale Computing Technology Challenges}},
  booktitle = {VECPAR},
  pages     = {1--25},
  year      = {2010},
}


% Workshop paper on HPC interconnection networks for exascale (2008).
% The second author is written "First Last" like the others; a comma there
% would make BibTeX treat the given name as the surname. Pages use a double hyphen.
@inproceedings{VTYR08,
  author    = {Jeffrey S. Vetter and Vinod Tipparaju and Weikuan Yu and Philip C. Roth},
  title     = {{HPC Interconnection Networks: The Key to Exascale Computing}},
  booktitle = {High Performance Computing Workshop},
  volume    = {18},
  pages     = {95--106},
  year      = {2008},
}

% Symposium paper on reading patterns for extreme-scale science IO (HPDC, 2011).
@inproceedings{LPGK11,
  author    = {Lofstead, Jay and Polte, Milo and Gibson, Garth and Klasky, Scott and Schwan, Karsten and Oldfield, Ron and Wolf, Matthew and Liu, Qing},
  title     = {{Six Degrees of Scientific Data: Reading Patterns for Extreme Scale Science IO}},
  booktitle = {Proceedings of the 20th international symposium on High performance distributed computing},
  pages     = {49--60},
  location  = {San Jose, California, USA},
  year      = {2011},
}

% Journal article on the path to exascale (volume 1, issue 2, 2010).
% The journal name is spelled out instead of the IJDST acronym, and the page
% range uses a double hyphen.
@article{ABBD10,
  author  = {Ken Alvin and
             Brian Barrett and
             Ron Brightwell and
             Sudip S. Dosanjh and
             Al Geist and
             K. Scott Hemmert and
             Michael A. Heroux and
             Doug Kothe and
             Richard C. Murphy and
             Jeff Nichols and
             Ron Oldfield and
             Arun Rodrigues and
             Jeffrey S. Vetter},
  title   = {{On the Path to Exascale}},
  journal = {International Journal of Distributed Systems and Technologies},
  volume  = {1},
  number  = {2},
  pages   = {1--22},
  year    = {2010},
}

@inproceedings{BBFG09,
    author    = {M. Bancroft and J. Bent and E. Felix and G. Grider and J. Nunez and S. Poole and R. Ross and E. Salmon and L. Ward},
    title     = {{HEC FSIO 2008 Workshop Report}},
    booktitle = {High End Computing Interagency Working Group (HECIWG) Sponsored File Systems and I/O Workshop HEC FSIO},
    year      = 2009
}

@inproceedings{BCST08,
  title     = {{Parallel I/O Prefetching Using MPI File Caching and I/O Signatures}},
  author    = {Byna, Surendra and Chen, Yong and Sun, Xian-He and Thakur, Rajeev and Gropp, William},
  year      = {2008},
  booktitle = {Proceedings of the 2008 ACM/IEEE conference on Supercomputing},
}

@inproceedings{CBST08,
  author    = {Yong Chen and Byna, S. and Xian-He Sun and Thakur, R. and Gropp, W.},
  title     = {{Exploring Parallel I/O Concurrency with Speculative Prefetching}},
  booktitle = {Parallel Processing, 2008. ICPP '08. 37th International Conference on},
  year      = {2008}
}

@inproceedings{CBST08a,
  title     = {{Hiding I/O Latency with Pre-execution Prefetching for Parallel Applications}},
  author    = {Chen, Yong and Byna, Surendra and Sun, Xian-He and Thakur, Rajeev and Gropp, William},
  booktitle = {Proceedings of the 2008 ACM/IEEE conference on Supercomputing},
  series    = {SC '08},
  location  = {Austin, Texas},
  pages     = {40:1--40:10},
  year      = {2008}
}

@inproceedings{ChRo10,
  author    = {Yong Chen and Roth, P.C.},
  title     = {{Collective Prefetching for Parallel I/O Systems}},
  booktitle = {Petascale Data Storage Workshop (PDSW), 2010 5th},
  year      = {2010},
  pages     = {1--5}
}


@inproceedings{CSTR11,
  author    = {Yong Chen and Xian-He Sun and Thakur, R. and Roth, P.C. and Gropp, W.D.},
  title     = {{LACIO: A New Collective I/O Strategy for Parallel I/O Systems}},
  booktitle = {Parallel Distributed Processing Symposium (IPDPS), 2011 IEEE International},
  year      = {2011},
  pages     = {794--804}
}


@inproceedings{CSTS10,
  author    = {Yong Chen and Xian-He Sun and Thakur, R. and Huaiming Song and Hui Jin},
  title     = {{Improving Parallel I/O Performance with Data Layout Awareness}},
  booktitle = {Cluster Computing (CLUSTER), 2010 IEEE International Conference on},
  year      = {2010},
  pages     = {302--311}
}

@article{ChSW08,
  title   = {{Algorithm-system Scalability of Heterogeneous Computing}},
  author  = {Chen, Yong and Sun, Xian-He and Wu, Ming},
  journal = {Journal of Parallel and Distributed Computing (JPDC)},
  year    = {2008},
  volume  = {68},
  pages   = {1403--1412}
}


@inproceedings{JiCS10,
  author    = {Hui Jin and Yong Chen and Huaiyu Zhu and Xian-He Sun},
  title     = {{Optimizing HPC Fault-Tolerant Environment: An Analytical Approach}},
  booktitle = {Parallel Processing (ICPP), 2010 39th International Conference on},
  year      = {2010},
  pages     = {525--534}
}
@inproceedings{SYCS11,
  author    = {Huaiming Song and
               Yanlong Yin and
               Yong Chen and
               Xian-He Sun},
  title     = {{A Cost-Based Application-Specific Data Layout Scheme for Parallel File Systems}},
  booktitle = {The 20th International Symposium on High Performance Distributed Computing (HPDC'11)},
  year      = {2011},
  pages     = {37--48},
}

@inproceedings{SuCY09,
  author    = {Xian-He Sun and
               Yong Chen and
               Yanlong Yin},
  title     = {{Data Layout Optimization for Petascale File Systems}},
  booktitle = {The 4th Petascale Data Storage Workshop (PDSW'09)},
  year      = {2009},
  pages     = {1--5},
}

@inproceedings{APWD08,
  author    = {Agrawal, Nitin and Prabhakaran, Vijayan and Wobber, Ted and Davis, John D. and Manasse, Mark and Panigrahy, Rina},
  title     = {{Design Tradeoffs for SSD Performance}},
  booktitle = {USENIX 2008 Annual Technical Conference},
  year      = {2008},
  location  = {Boston, Massachusetts},
  pages     = {57--70},
}


@inproceedings{DoXi11,
  author    = {Xiangyu Dong and Yuan Xie},
  title     = {{AdaMS: Adaptive MLC/SLC Phase-change Memory Design for File Storage}},
  booktitle = {ASP-DAC},
  year      = {2011},
  pages     = {31--36},
}


@inproceedings{LIMB09,
  title     = {{Architecting Phase Change Memory as a Scalable DRAM Alternative}},
  author    = {Lee, Benjamin C. and Ipek, Engin and Mutlu, Onur and Burger, Doug},
  booktitle = {Proceedings of the 36th annual international symposium on Computer architecture},
  series    = {ISCA '09},
  location  = {Austin, TX, USA},
  pages     = {2--13},
  year      = {2009},
}


@inproceedings{ChKZ11,
  author    = {Feng Chen and David A. Koufaty and Xiaodong Zhang},
  title     = {{Hystor: Making the Best Use of Solid State Drives in High Performance Storage Systems}},
  booktitle = {ICS},
  year      = {2011},
  pages     = {22--32}
}

@inproceedings{ACIK09,
  author    = {Nawab Ali and Philip H. Carns and Kamil Iskra and others},
  title     = {{Scalable I/O Forwarding Framework for High-performance Computing Systems}},
  booktitle = {CLUSTER},
  year      = {2009},
}


@inproceedings{IRYB08,
  author    = {Iskra, Kamil and Romein, John W. and Yoshii, Kazutomo and Beckman, Pete},
  title     = {{ZOID: I/O-forwarding Infrastructure for Petascale Architectures}},
  booktitle = {PPoPP},
  year      = {2008},
}


@inproceedings{VHIK10,
  author    = {Vishwanath, Venkatram and Hereld, Mark and Iskra, Kamil and Kimpe, Dries and Morozov, Vitali and Papka, Michael E. and Ross, Robert and Yoshii, Kazutomo},
  title     = {{Accelerating {I/O} Forwarding in {IBM} Blue {Gene/P} Systems}},
  booktitle = {Proceedings of International Conference for High Performance Computing, Networking, Storage and Analysis (SC10)},
  year      = {2010},
  pages     = {1--10},
}

@inproceedings{ScHa02,
  title     = {{GPFS: A Shared-Disk File System for Large Computing Clusters}},
  author    = {Schmuck, Frank and Haskin, Roger},
  year      = {2002},
  booktitle = {Proceedings of the 1st USENIX Conference on File and Storage Technologies},
}


@inproceedings{PTHJ01,
  author    = {Prost, Jean-Pierre and Treumann, Richard and Hedges, Richard and Jia, Bin and Koniges, Alice},
  title     = {{MPI-IO/GPFS, an Optimized Implementation of MPI-IO on Top of GPFS}},
  booktitle = {Proceedings of the 2001 ACM/IEEE conference on Supercomputing (CDROM)},
  series    = {Supercomputing '01},
  year      = {2001},
  pages     = {17},
}


@inproceedings{RiGF98,
  author    = {Riedel, Erik and Gibson, Garth A. and Faloutsos, Christos},
  title     = {{Active Storage for Large-Scale Data Mining and Multimedia}},
  booktitle = {Proceedings of the 24th International Conference on Very Large Data Bases},
  series    = {VLDB '98},
  year      = {1998},
}

@article{MaRe03,
  author    = {Xiaonan Ma and A. L. Narasimha Reddy},
  title     = {{MVSS: An Active Storage Architecture}},
  journal   = {IEEE Transactions On Parallel and Distributed Systems},
  volume    = {14},
  number    = {10},
  year      = {2003},
  pages     = {993--1005},
}

% NOTE(review): same title, venue and year as entry SLCR10 -- likely a duplicate; consider consolidating.
@inproceedings{WSPR10,
  author    = {Son, Seung Woo and Lang, Samuel and Carns, Philip and others},
  title     = {{Enabling Active Storage on Parallel I/O Software Stacks}},
  booktitle = {Proceedings of the 2010 IEEE 26th Symposium on Mass Storage Systems and Technologies (MSST)},
  series    = {MSST '10},
  year      = {2010},
  pages     = {1--12},
}

@inproceedings{RiTh08,
  author    = {Rich, Brandon and Thain, Douglas},
  title     = {{DataLab: Transactional Data-parallel Computing on an Active Storage Cloud}},
  booktitle = {HPDC},
  year      = {2008},
}

@inproceedings{SLCR10,
  author    = {Seung Woo Son and Lang, S. and Carns, P. and Ross, R. and Thakur, R. and Ozisikyilmaz, B. and Kumar, P. and Wei-Keng Liao and Choudhary, A.},
  title     = {{Enabling Active Storage on Parallel I/O Software Stacks}},
  booktitle = {Mass Storage Systems and Technologies (MSST), 2010 IEEE 26th Symposium on},
  year      = {2010},
}

@inproceedings{XMFL11,
  author       = {Yulai Xie and Kiran-Kumar Muniswamy-Reddy and Dan Feng and others},
  title        = {{Design and Evaluation of Oasis: An Active Storage Framework based on T10 OSD Standard}},
  booktitle    = {MSST},
  year         = {2011}
}

@inproceedings{AcUS98,
  author    = {Acharya, Anurag and Uysal, Mustafa and Saltz, Joel},
  title     = {{Active Disks: Programming Model, Algorithms and Evaluation}},
  booktitle = {Proceedings of the 8th International Conference on Architectural Support for Programming Languages and Operating Systems},
  volume    = {33},
  year      = {1998},
  pages     = {81--91},
}

% NOTE(review): the key suggests 2002 but year is 2005, and volume/pages may
% belong to a journal version of this paper -- verify against the publisher record.
@inproceedings{ChMa02,
  author    = {Chockler, Gregory and Malkhi, Dahlia},
  title     = {{Active Disk Paxos with Infinitely Many Processes}},
  booktitle = {Proceedings of the 21st Annual Symposium on Principles of Distributed Computing},
  volume    = {18},
  year      = {2005},
  pages     = {73--84}
}

@inproceedings{UyAS00,
  title     = {{Evaluation of Active Disks for Decision Support Databases}},
  author    = {Mustafa Uysal and Anurag Acharya and Joel Saltz},
  booktitle = {Proceedings of the International Symposium on High-performance Computer Architecture},
  pages     = {337--348},
  year      = {2000}
}


@inproceedings{LKWD01,
  title     = {Active Disk File System: A Distributed, Scalable File System},
  author    = {Lim, Hyeran and Kapoor, Vikram and Wighe, Chirag and Du, David H.-C.},
  booktitle = {Proceedings of the 8th IEEE Symposium on Mass Storage Systems and Technologies},
  series    = {MSST'01},
  year      = {2001}
}


@article{KePH98,
  title   = {{A Case for Intelligent Disks (IDISKs)}},
  author  = {Keeton, Kimberly and Patterson, David A. and Hellerstein, Joseph M.},
  journal = {ACM SIGMOD Record},
  year    = {1998},
  volume  = {27},
  pages   = {42--52}
}


@inproceedings{MeKC00,
  author    = {Memik, Gokhan and Choudhary, Alok and Kandemir, Mahmut T.},
  title     = {{Design and Evaluation of Smart Disk Architecture for DSS Commercial Workloads}},
  booktitle = {Proceedings of the 2000 International Conference on Parallel Processing},
  series    = {ICPP '00},
  year      = {2000},
  pages     = {335+},
}

@inproceedings{SPPD03,
  author    = {Sivathanu, Muthian and Prabhakaran, Vijayan and Popovici, Florentina I. and Denehy, Timothy E. and Arpaci-Dusseau, Andrea C. and Arpaci-Dusseau, Remzi H.},
  title     = {{Semantically-Smart Disk Systems}},
  booktitle = {Proceedings of the Second USENIX Symposium on File and Storage Technologies (FAST '03)},
  year      = {2003}
}

@inproceedings{ChLC03,
  title     = {{Design and Evaluation of Distributed Smart Disk Architecture for I/O-intensive Workloads}},
  author    = {Chiu, Steve and Liao, Wei-keng and Choudhary, Alok},
  booktitle = {Proceedings of the 2003 International Conference on Computational Science},
  series    = {ICCS'03},
  pages     = {230--241},
  year      = {2003},
}


@inproceedings{EHHN10,
  author    = {Marc Eshel and Roger L. Haskin and Dean Hildebrand and Manoj Naik and Frank B. Schmuck and Renu Tewari},
  title     = {{Panache: A Parallel File System Cache for Global File Access}},
  booktitle = {FAST},
  year      = {2010},
  pages     = {155--168},
}

@article{WYMG09,
  author  = {Wang, Jun and Yao, Xiaoyu and Mitchell, Christopher and Gu, Peng},
  title   = {{A New Hierarchical Data Cache Architecture for iSCSI Storage Server}},
  journal = {IEEE Transactions on Computers},
  volume  = {58},
  year    = {2009},
  pages   = {433--447},
}

@inproceedings{AWEK10,
  author    = {Abbasi, Hasan and Wolf, Matthew and Eisenhauer, Greg and others},
  title     = {{DataStager: Scalable Data Staging Services for Petascale Applications}},
  booktitle = {HPDC},
  year      = {2009}
}

@inproceedings{AEWS11,
  author    = {Hasan Abbasi and Greg Eisenhauer and Matthew Wolf and Karsten Schwan and Scott Klasky},
  title     = {{Just in time: Adding Value to the IO Pipelines of High Performance Applications with JITStaging}},
  booktitle = {HPDC},
  year      = {2011},
  pages     = {27--36}
}


@inproceedings{GuWR08,
  title     = {{Bridging the Gap Between Parallel File Systems and Local File Systems: A Case Study with PVFS}},
  author    = {Gu, Peng and Wang, Jun and Ross, Robert},
  year      = {2008},
  booktitle = {ICPP}
}

@inproceedings{WPBW09,
  title     = {{Exploiting Latent I/O Asynchrony in Petascale Science Applications}},
  author    = {Payne, Mary and Widener, Patrick and Wolf, Matthew and Abbasi, Hasan and McManus, Scott and Bridges, Patrick G. and Schwan, Karsten},
  booktitle = {Proceedings of the 2008 Fourth IEEE International Conference on eScience},
  pages     = {410--411},
  year      = {2008}
}

@article{WWAM11,
  author  = {Widener, Patrick and Wolf, Matthew and Abbasi, Hasan and McManus, Scott and Payne, Mary and Barrick, Matthew and Pulikottil, Jack and Bridges, Patrick and Schwan, Karsten},
  title   = {{Exploiting Latent I/O Asynchrony in Petascale Science Applications}},
  journal = {IJHPCA},
  volume  = {25},
  year    = {2011},
  pages   = {161--179},
}

@inproceedings{BGGM09,
  author    = {Bent, John and Gibson, Garth and Grider, Gary and McClelland, Ben and Nowoczynski, Paul and Nunez, James and Polte, Milo and Wingate, Meghan},
  title     = {{PLFS: a Checkpoint Filesystem for Parallel Applications}},
  booktitle = {SC '09: Proceedings of the Conference on High Performance Computing Networking, Storage and Analysis},
  year      = {2009},
  pages     = {1--12},
}

@inproceedings{OWRM06,
  author    = {Ron Oldfield and Lee Ward and Rolf Riesen and Arthur B. Maccabe and Patrick Widener and Todd Kordenbrock},
  title     = {{Lightweight I/O for Scientific Applications}},
  booktitle = {CLUSTER},
  year      = {2006},
}

@inproceedings{ZhJD09,
  author    = {Xuechen Zhang and
               Song Jiang and
               Kei Davis},
  title     = {{Making Resonance a Common Case: A High-performance Implementation of Collective I/O on Parallel File Systems}},
  booktitle = {IPDPS},
  year      = {2009},
}

@inproceedings{ZADL10,
  author    = {Fang Zheng and
               Hasan Abbasi and
               Ciprian Docan and
               others},
  title     = {{PreDatA - Preparatory Data Analytics on Peta-scale Machines}},
  booktitle = {IPDPS},
  year      = {2010},
  pages     = {1--12},
}


@inproceedings{LKSP08,
  author    = {Lofstead, Jay F. and Klasky, Scott and Schwan, Karsten and others},
  title     = {{Flexible IO and Integration for Scientific Codes through the Adaptable IO System (ADIOS)}},
  booktitle = {Proceedings of the 6th international workshop on Challenges of large applications in distributed environments},
  year      = {2008},
}

@inproceedings{LZKS09,
  author    = {Lofstead, Jay and Zheng, Fang and Klasky, Scott and Schwan, Karsten},
  title     = {{Adaptable, Metadata Rich IO Methods for Portable High Performance IO}},
  booktitle = {Proceedings of the 2009 IEEE International Symposium on Parallel \& Distributed Processing},
  series    = {IPDPS '09},
  year      = {2009},
  pages     = {1--10},
}

@inproceedings{LZLK10,
  title     = {{Managing Variability in the IO Performance of Petascale Storage Systems}},
  author    = {Lofstead, Jay and Zheng, Fang and Liu, Qing and Klasky, Scott and Oldfield, Ron and Kordenbrock, Todd and Schwan, Karsten and Wolf, Matthew},
  booktitle = {Proceedings of the 2010 ACM/IEEE International Conference for High Performance Computing, Networking, Storage and Analysis},
  series    = {SC '10},
  pages     = {1--12},
  year      = {2010}
}

@inproceedings{LCCC07,
  author    = {Wei-keng Liao and
               Avery Ching and
               Kenin Coloma and
               others},
  title     = {{An Implementation and Evaluation of Client-Side File Caching for MPI-IO}},
  booktitle = {IPDPS},
  year      = {2007},
}


@inproceedings{NiLC08,
  title     = {{Scaling Parallel I/O Performance through I/O Delegate and Caching System}},
  author    = {Nisar, Arifa and Liao, Wei-keng and Choudhary, Alok},
  booktitle = {Proceedings of the 2008 ACM/IEEE conference on Supercomputing},
  series    = {SC '08},
  pages     = {9:1--9:12},
  year      = {2008}
}

@inproceedings{NiLo97,
  title     = {{Collective Buffering: Improving Parallel I/O Performance}},
  author    = {Bill Nitzberg and Virginia Lo},
  year      = {1997},
  booktitle = {High-Performance Distributed Computing, International Symposium on}
}

@inproceedings{MWLY02,
  title     = {{Faster Collective Output through Active Buffering}},
  author    = {Xiaosong Ma and Marianne Winslett and Jonghyun Lee and Shengke Yu},
  year      = {2002},
  booktitle = {IPDPS}
}


@article{VSKT06,
  title   = {{Discretionary Caching for I/O on Clusters}},
  author  = {Vilayannur, Murali and Sivasubramaniam, Anand and Kandemir, Mahmut and Thakur, Rajeev and Ross, Robert},
  journal = {Cluster Computing},
  year    = {2006},
  volume  = {9},
  pages   = {29--44},
  issn    = {1386-7857}
}


% NOTE(review): every field here is identical to entry VSKT06 although the key
% suggests a 2003 work -- verify which paper was intended.
@article{VSKR03,
  title   = {{Discretionary Caching for I/O on Clusters}},
  author  = {Vilayannur, Murali and Sivasubramaniam, Anand and Kandemir, Mahmut and Thakur, Rajeev and Ross, Robert},
  journal = {Cluster Computing},
  year    = {2006},
  volume  = {9},
  pages   = {29--44},
  issn    = {1386-7857}
}

@inproceedings{RLUW09,
    author    = {R. Ross and R. Latham and M. Unangst and B. Welch},
    title     = {{Parallel I/O in Practice}},
    booktitle = {Tutorial in the ACM/IEEE Supercomputing Conference},
    year      = 2009
}

@inproceedings{TaCh11,
  title     = {{A Comprehensive Benchmark Suite for Emerging Solid State Drives}},
  author    = {A. Tambi and Y. Chen},
  year      = {2011},
  booktitle = {Poster in the 23rd ACM/IEEE Supercomputing Conference (SC'11)},
}

@inproceedings{GuCZ11,
    author    = {Y. Guvvala and Y. Chen and Y. Zhuang},
    title     = {{Rethinking RAID for SSD based HPC Systems}},
    booktitle = {Poster in the 23rd ACM/IEEE Supercomputing Conference (SC'11)},
    year      = 2011
}

@unpublished{pcm_cache_hdd,
    author = {Z. Liu and B. Wang and P. Carpenter and D. Li and J. Vetter and W. Yu},
    title  = {{PCM-Based Durable Write Cache for Fast Disk I/O}},
    note   = {Submitted to IEEE Conference on Massive Data Storage},
    year   = 2011
}

@inproceedings{PGGS95,
  title     = {{Informed Prefetching and Caching}},
  author    = {Patterson, R. H. and Gibson, G. A. and Ginting, E. and Stodolsky, D. and Zelenka, J.},
  year      = {1995},
  booktitle = {SOSP}
}

@inproceedings{GrAp95,
    author    = {James Griffioen and Randy Appleton},
    title     = {{Performance Measurements of Automatic Prefetching}},
    booktitle = {Proceedings of the ISCA International Conference on Parallel and Distributed Computing Systems},
    year      = {1995},
    pages     = {165--170}
}

@inproceedings{LeDu97,
  author    = {Lei, Hui and Duchamp, Dan},
  title     = {{An analytical approach to file prefetching}},
  booktitle = {Proceedings of the Annual Conference on USENIX Annual Technical Conference},
  year      = {1997},
  pages     = {21},
}

@inproceedings{HiRe03,
  author    = {Highley, Timothy and Reynolds, Paul},
  title     = {{Marginal Cost-Benefit Analysis for Predictive File Prefetching}},
  booktitle = {Proceedings of the 41st Annual ACM Southeast Conference (ACMSE 2003)},
  year      = {2003},
}

@article{TrRe04,
  author  = {Tran, Nancy and Reed, Daniel A.},
  title   = {{Automatic ARIMA Time Series Modeling for Adaptive I/O Prefetching}},
  journal = {IEEE Transactions on Parallel and Distributed Systems},
  volume  = {15},
  year    = {2004},
  pages   = {362--377},
}


@inproceedings{ChGi99,
  author    = {Chang, Fay and Gibson, Garth A.},
  title     = {{Automatic I/O Hint Generation Through Speculative Execution}},
  booktitle = {Proceedings of the 3rd Symposium on Operating Systems Design and Implementation},
  series    = {OSDI '99},
  year      = {1999},
  pages     = {1--14},
}

@inproceedings{YaMC02,
  title     = {{A Decoupled Architecture for Application-Specific File Prefetching}},
  author    = {Yang, Chuan-Kai and Mitra, Tulika and Chiueh, Tzi-cker},
  booktitle = {Proceedings of the FREENIX Track: 2002 USENIX Annual Technical Conference},
  pages     = {157--170},
  year      = {2002}
}

@inproceedings{BICL09,
  author    = {Blas, Javier Garc{\'\i}a and Isail{\u{a}}, Florin and Carretero, J. and Latham, Robert and Ross, Robert},
  title     = {{Multiple-Level MPI File Write-Back and Prefetching for Blue Gene Systems}},
  booktitle = {Proceedings of the 16th European PVM/MPI Users' Group Meeting on Recent Advances in Parallel Virtual Machine and Message Passing Interface},
  year      = {2009},
  pages     = {164--173},
}

@inproceedings{RaBN08,
  author    = {Rafique, M. Mustafa and Butt, Ali R. and Nikolopoulos, Dimitrios S.},
  title     = {{DMA-based Prefetching for I/O-Intensive Workloads on the Cell Architecture}},
  booktitle = {Proceedings of the 5th conference on Computing frontiers},
  series    = {CF '08},
  year      = {2008},
  pages     = {23--32},
}

@inproceedings{ZLMZ08,
  title     = {{PFC: Transparent Optimization of Existing Prefetching Strategies for Multi-Level Storage Systems}},
  author    = {Zhang, Zhe and Lee, Kyuhyung and Ma, Xiaosong and Zhou, Yuanyuan},
  booktitle = {Proceedings of the 2008 The 28th International Conference on Distributed Computing Systems},
  series    = {ICDCS '08},
  pages     = {740--751},
  year      = {2008}
}

@booklet{CESM,
  title        = {{Community Earth System Model}},
  howpublished = {\url{http://www.cesm.ucar.edu}},
}

@booklet{GCRM,
  title        = {{Global Cloud Resolving Model (GCRM)}},
  howpublished = {\url{https://svn.pnl.gov/gcrm}},
}

@booklet{HNSE,
  title        = {{CeNSE - Central Nervous System for the Earth}},
  howpublished = {\url{http://www.hpl.hp.com/research/intelligent_infrastructure.html}},
}

@booklet{NEON,
  title        = {{The National Ecological Observatory Network (NEON)}},
  howpublished = {\url{http://www.neoninc.org}},
}

@article{CLGN09,
  title   = {{Scalable I/O and analytics}},
  author  = {Alok Choudhary and Wei-keng Liao and Kui Gao and Arifa Nisar and Robert Ross and Rajeev Thakur and Robert Latham},
  journal = {Journal of Physics: Conference Series},
  year    = {2009},
  volume  = {180},
  doi     = {10.1088/1742-6596/180/1/012048},
  masid   = {6191428},
}

@inproceedings{DeGh04,
  author    = {Jeffrey Dean and Sanjay Ghemawat},
  title     = {{MapReduce: Simplified Data Processing on Large Clusters}},
  booktitle = {Operating Systems Design and Implementation},
  year      = {2004},
  pages     = {137--150},
  masid     = {1812573}
}

@inproceedings{ElSm06,
  author    = {Tarek A. El-Ghazawi and Lauren Smith},
  title     = {{UPC: unified parallel C}},
  booktitle = {Supercomputing Conference},
  year      = {2006},
  doi       = {10.1145/1188455.1188483},
  masid     = {2470001}
}

@book{GrLT99,
  author    = {Gropp, William and Lusk, Ewing and Thakur, Rajeev},
  title     = {{Using MPI-2: Advanced Features of the Message-Passing Interface}},
  year      = {1999},
  isbn      = {0262571331},
  publisher = {MIT Press},
  address   = {Cambridge, MA, USA},
}

@booklet{HPCC,
  title        = {{High Performance Computing Center}},
  howpublished = {\url{http://www.hpcc.ttu.edu}},
}

@inproceedings{NiHL94,
  author    = {Nieplocha, Jaroslaw and Harrison, Robert J. and Littlefield, Richard J.},
  title     = {Global arrays: a portable ``shared-memory'' programming model for distributed memory computers},
  booktitle = {Proceedings of the 1994 ACM/IEEE conference on Supercomputing},
  series    = {Supercomputing '94},
  year      = {1994},
}

@techreport{RiGi97,
    author      = {Erik Riedel and Garth Gibson},
    title       = {Active Disks - Remote Execution for Network-Attached Storage},
    institution = {Carnegie Mellon University},
    year        = {1997}
}

@article{RCDG06,
  author  = {Won Woo Ro and Stephen P. Crago and Alvin M. Despain and Jean-Luc Gaudiot},
  title   = {{Design and evaluation of a hierarchical decoupled architecture}},
  journal = {The Journal of Supercomputing},
  volume  = {38},
  number  = {3},
  year    = {2006},
  pages   = {237--259},
  doi     = {10.1007/s11227-006-8321-2},
  masid   = {2516931}
}

@booklet{PostGIS,
  title        = {{PostGIS}},
  howpublished = {\url{http://postgis.refractions.net}},
}

@inproceedings{SMWB10,
  title     = {{MRAP: a novel MapReduce-based framework to support HPC analytics applications with access patterns}},
  author    = {Saba Sehrish and Grant Mackey and Jun Wang and John Bent},
  booktitle = {IEEE International Symposium on High Performance Distributed Computing},
  pages     = {107--118},
  year      = {2010},
  doi       = {10.1145/1851476.1851490},
  masid     = {13988525},
}

@booklet{IOSIG,
  title        = {{IOSIG Project}},
  howpublished = {\url{http://www.cs.iit.edu/~scs/iosig}},
}

@article{SuBC07a,
  author  = {Xian-He Sun and Surendra Byna and Yong Chen},
  title   = {{Server-Based Data Push Architecture for Multi-Processor Environments}},
  journal = {Journal of Computer Science and Technology},
  volume  = {22},
  number  = {5},
  year    = {2007},
  pages   = {641--652},
  doi     = {10.1007/s11390-007-9090-y},
  masid   = {4397514}
}

@inproceedings{SuBC07b,
  author    = {Xian-He Sun and Surendra Byna and Yong Chen},
  title     = {{Improving Data Access Performance with Server Push Architecture}},
  booktitle = {International Parallel and Distributed Processing Symposium/International Parallel Processing Symposium},
  year      = {2007},
  pages     = {1--6},
  doi       = {10.1109/IPDPS.2007.370511},
  masid     = {2449100}
}

@inproceedings{TSPL11,
  author    = {Tantisiriroj, Wittawat and Son, Seung Woo and Patil, Swapnil and Lang, Samuel J. and Gibson, Garth and Ross, Robert B.},
  title     = {On the duality of data-intensive file system design: reconciling {HDFS} and {PVFS}},
  booktitle = {Proceedings of 2011 International Conference for High Performance Computing, Networking, Storage and Analysis},
  series    = {SC '11},
  year      = {2011},
  isbn      = {978-1-4503-0771-0},
  location  = {Seattle, Washington},
  pages     = {67:1--67:12},
  articleno = {67},
  numpages  = {12},
  url       = {http://doi.acm.org/10.1145/2063384.2063474},
  doi       = {10.1145/2063384.2063474},
  acmid     = {2063474},
  publisher = {ACM},
  address   = {New York, NY, USA},
  keywords  = {HDFS, Hadoop, PVFS, cloud computing, file systems},
}

% NOTE(review): converted from an article whose journal field held a division name;
% the report number below should be confirmed against the cited revision of the guide.
@techreport{TRLG97,
  author      = {Rajeev Thakur and Robert Ross and Ewing Lusk and William Gropp},
  title       = {{Users Guide for ROMIO: A High-Performance, Portable MPI-IO Implementation}},
  institution = {Mathematics and Computer Science Division, Argonne National Laboratory},
  type        = {Technical Memorandum},
  number      = {ANL/MCS-TM-234},
  year        = {1997},
  masid       = {402293}
}

@inproceedings{TWAC01,
  title     = {Flow computation on massive grids},
  author    = {Toma, Laura and Wickremesinghe, Rajiv and Arge, Lars and Chase, Jeffery S. and Vitter, Jeffery Scott and Halpin, Patrick N. and Urban, Dean},
  booktitle = {Proceedings of the 9th ACM international symposium on Advances in geographic information systems},
  series    = {GIS '01},
  year      = {2001}
}

@inproceedings{YuVe08,
  author    = {Yu, Weikuan and Vetter, Jeffrey},
  title     = {{ParColl: Partitioned Collective I/O on the Cray XT}},
  booktitle = {ICPP},
  year      = {2008},
}

@article{ZeWa07,
  author  = {Charles S. Zender},
  title   = {Analysis of Self-describing Gridded Geoscience Data with {netCDF Operators (NCO)}},
  journal = {Environ.\ Modell.\ Softw.},
  key     = {Zender08},
  year    = 2008,
  volume  = 23,
  number  = 10,
  pages   = {1338--1342},
  doi     = {10.1016/j.envsoft.2008.03.004},
  month   = oct,
}

@inproceedings{ThGL99,
  author    = {Thakur, Rajeev and Gropp, William and Lusk, Ewing},
  title     = {{Data Sieving and Collective I/O in ROMIO}},
  booktitle = {Proceedings of the 7th Symposium on the Frontiers of Massively Parallel Computation},
  series    = {FRONTIERS '99},
  year      = {1999},
}

@inproceedings{LiCh08,
  author    = {Liao, Wei-keng and Choudhary, Alok},
  title     = {Dynamically adapting file domain partitioning methods for collective {I/O} based on underlying parallel file system locking protocols},
  booktitle = {Proceedings of the 2008 ACM/IEEE conference on Supercomputing},
  series    = {SC'08},
  year      = {2008},
}